#pragma once
#include <iostream>
#include<vector>
#include<string>
#include<map>
#include <set>
#include<regex>
#include "splitTool.h"
#include <func.h>
#include "cppjieba/Jieba.hpp"
using namespace std;

// Represents a single web page: its raw text plus the word list and the
// word-frequency table associated with it.
// NOTE(review): the member functions are only declared here; anything marked
// "presumably" below should be confirmed against their definitions.
class WebPage
{
public:
    // Builds a page from `content`. The argument is a non-const reference, so
    // callers have to pass an lvalue. Presumably it is copied into _content.
    WebPage(std::string& content);

    // Processes the document. Presumably splits _content with _spl and fills
    // _words / _wordsMap -- TODO confirm.
    void processDoc();

    // Mutable access to the page's word list (presumably _words).
    std::vector<std::string>& getWords();

    // Mutable access to the word -> count table (presumably _wordsMap).
    std::map<std::string, int>& getWordsMap();

private:
    // Data members stay in this order: it fixes their initialization order.
    std::string _content;
    std::vector<std::string> _words;       // which words this article contains
    std::map<std::string, int> _wordsMap;  // every word of this page and its frequency
    static SplitTool* _spl;                // one pointer shared by all WebPage objects
};
